% Data-set reference cited by URL only; the entry records no author.
@misc{WTX,
  title        = {Government Data Set},
  howpublished = {\url{http://acsys.anu.edu.au/}},
  year         = 2000,
}

% Journal article describing CTAN. Whole words (not single letters) are
% braced so sentence-casing styles keep their capitals, and TeX is typeset
% with its logo macro. The journal name is spelled the way the journal
% spells it (lowercase b).
@article{greenwade93,
  author  = {Greenwade, George D.},
  title   = {The {Comprehensive} {\TeX} {Archive} {Network} ({CTAN})},
  journal = {TUGboat},
  year    = {1993},
  volume  = {14},
  number  = {3},
  pages   = {342--351},
}

% Web spam data-set page, cited by URL; the entry records no author.
% The organisation name is braced as a unit so that sentence-casing
% styles do not lowercase the word Research.
@misc{WEBSPAM-UK2007,
  title        = {{Yahoo! Research}: Web Spam Collections},
  howpublished = {\url{http://www.yr-bcn.es/webspam/datasets/uk2007/}},
  year         = {2007},
}

% Report with three authors. Names are written in the unambiguous
% "von Last, First" form and separated by the keyword "and"; a comma
% between two names would make BibTeX parse them as a single person.
@article{Porter,
  author  = {van Rijsbergen, C. J. and Robertson, S. E. and Porter, M. F.},
  title   = {New models in probabilistic information retrieval},
  journal = {British Library Research and Development Report},
  year    = {1980},
  number  = {5587},
}
% Word-list web page, cited by URL; the entry records no author.
% The proper adjective English is braced so that sentence-casing styles
% keep its capital letter.
@misc{Common,
  title        = {The Most Common {English} Words},
  howpublished = {\url{http://www.world-english.org/english500.htm}},
  year         = {2009},
}

% Conference paper. The title is left for the bibliography style to case
% (no whole-title brace wrapper), the month uses the predefined three-letter
% macro, and the ordinal in the proceedings name is plain text rather than
% math-mode markup. Acronyms in the proceedings name are brace-protected.
@inproceedings{kruegel03:webanomaly,
  author    = {Kruegel, C. and Vigna, G.},
  title     = {Anomaly Detection of Web-based Attacks},
  booktitle = {Proceedings of the 10th {ACM} Conference on Computer and Communications Security ({CCS} '03)},
  year      = 2003,
  month     = oct,
  address   = {Washington, DC},
  pages     = {251--261},
  publisher = {ACM Press},
}

	
